# Creating an RDD by Parallelizing a Local Collection
# coding: utf8
from pyspark import SparkConf, SparkContext

if __name__ == '__main__':
    # Run Spark locally, using all available CPU cores
    conf = SparkConf().setAppName("test").setMaster("local[*]")
    sc = SparkContext(conf=conf)

    # Without an explicit numSlices argument, the partition count follows
    # spark.default.parallelism (under local[*], the number of local cores)
    rdd = sc.parallelize([1, 2, 3, 4, 5, 6, 7, 8, 9])
    print("Default number of partitions:", rdd.getNumPartitions())

    # The second argument (numSlices) sets the partition count explicitly
    rdd = sc.parallelize([1, 2, 3, 4, 5, 6, 7, 8, 9], 3)
    print("Number of partitions:", rdd.getNumPartitions())

    print("rdd的内容是：",rdd.collect())